package top.jolyoulu.core.rdd.operator.transform

import org.apache.spark.rdd.RDD
import org.apache.spark.{SparkConf, SparkContext}

/**
 * Example of the RDD `map` transformation on a log file.
 *
 * @Author: JolyouLu
 * @Date: 2024/2/7 20:51
 * @Description Reads the classpath resource `datas/apache.log` as an RDD of lines, splits every
 *              line on single spaces, extracts the field at index 6 (stored in `urlRDD`, i.e.
 *              used here as the request URL) and prints each extracted value to stdout.
 */
object Spark01_RDD_Operator_Map2 {

  /**
   * Program entry point.
   *
   * @param args command-line arguments; not used
   * @throws java.io.FileNotFoundException if `datas/apache.log` cannot be resolved to a file path
   *                                       through the class loader
   */
  def main(args: Array[String]): Unit = {
    val resourceName = "datas/apache.log"
    // Zero-based position of the space-separated field that is extracted from each line.
    val urlFieldIndex = 6

    // Resolve the input before starting Spark so that a missing file fails fast with a clear
    // message. getResource returns null for an unknown resource, and URI.getPath returns null
    // for opaque URIs, so both results are wrapped in Option.
    val path: String = Option(getClass.getClassLoader.getResource(resourceName))
      .flatMap(url => Option(url.toURI.getPath))
      .getOrElse(
        throw new java.io.FileNotFoundException(
          s"Classpath resource '$resourceName' could not be resolved to a file path"
        )
      )

    // Set up the environment; local[*] means: use all cores available on the current machine.
    val sparkConf: SparkConf = new SparkConf().setMaster("local[*]").setAppName("RDD")
    val sc: SparkContext = new SparkContext(sparkConf)

    try {
      val logRDD: RDD[String] = sc.textFile(path)

      // Lines with fewer than (urlFieldIndex + 1) fields (e.g. blank lines) are skipped;
      // indexing them directly would throw ArrayIndexOutOfBoundsException and abort the job.
      val urlRDD: RDD[String] = logRDD
        .map(_.split(" "))
        .filter(_.length > urlFieldIndex)
        .map(fields => fields(urlFieldIndex))

      urlRDD.collect().foreach(println)
    } finally {
      // Shut the environment down even when the job above fails.
      sc.stop()
    }
  }

}
